from llama_index.readers.web import SimpleWebPageReader

# Single page to fetch; the item title in the URL path is percent-encoded.
page_urls = [
    "https://baike.baidu.com/item/%E7%9F%A5%E4%B9%8E%E7%9F%A5%E5%AD%A6%E5%A0%82/64028760",
]

# NOTE(review): html_to_text=True presumably makes the reader return plain
# text rather than raw HTML -- confirm against the llama_index reader docs.
reader = SimpleWebPageReader(html_to_text=True)
documents = reader.load_data(page_urls)

# Print the text of the first loaded document.
first_document = documents[0]
print(first_document.text)